
# Toy fixture, indexed as [num_episode, num_agent, episode_length, *step_shape].
# Each step is a tuple laid out as (g, o, a, r, d, ava).
# NOTE(review): presumably global state, observation, action, reward, done
# flag and available-action mask -- confirm against the code that consumes it.
# In this data g is always [episode, agent, step] and o is always [0, step].
toy_example = [
    # Episode 0: three agents, three steps each.
    [
        # Agent 0: d is already True at step 1 and stays True at step 2.
        [
            ([0, 0, 0], [0, 0], [0], [1], False, [1, 1]),
            ([0, 0, 1], [0, 1], [1], [1], True, [1, 1]),
            ([0, 0, 2], [0, 2], [0], [1], True, [1, 1]),
        ],
        # Agent 1: d is True only on the last step, where ava is all zeros.
        [
            ([0, 1, 0], [0, 0], [0], [1], False, [1, 1]),
            ([0, 1, 1], [0, 1], [1], [1], False, [1, 1]),
            ([0, 1, 2], [0, 2], [0], [1], True, [0, 0]),
        ],
        # Agent 2: same d / ava pattern as agent 1.
        [
            ([0, 2, 0], [0, 0], [0], [1], False, [1, 1]),
            ([0, 2, 1], [0, 1], [1], [1], False, [1, 1]),
            ([0, 2, 2], [0, 2], [0], [1], True, [0, 0]),
        ],
    ],
    # Episode 1: three agents, two steps each; every agent has d True on
    # the second step and ava stays [1, 1] throughout.
    [
        # Agent 0
        [
            ([1, 0, 0], [0, 0], [0], [1], False, [1, 1]),
            ([1, 0, 1], [0, 1], [1], [1], True, [1, 1]),
        ],
        # Agent 1
        [
            ([1, 1, 0], [0, 0], [0], [1], False, [1, 1]),
            ([1, 1, 1], [0, 1], [1], [1], True, [1, 1]),
        ],
        # Agent 2
        [
            ([1, 2, 0], [0, 0], [0], [1], False, [1, 1]),
            ([1, 2, 1], [0, 1], [1], [1], True, [1, 1]),
        ],
    ],
]

